<!DOCTYPE html>
<html xmlns="http://www.w3.org/1999/xhtml" lang="$lang$" xml:lang="$lang$"$if(dir)$ dir="$dir$"$endif$>
<head>
  <meta charset="utf-8" />
  <meta name="generator" content="pandoc" />
  <meta name="viewport" content="width=device-width, initial-scale=1.0, user-scalable=yes" />
  <!-- Favicon; written in the same self-closing form as the other void elements in this head. -->
  <link rel="shortcut icon" type="image/x-icon" href="favicon.ico" />

  <!-- Open Graph metadata used for link previews: type, share image, title, description, URL. -->
  <!-- NOTE(review): the og:image URL is a GitHub blob page URL with no file extension; link-preview crawlers normally need a direct image URL. Confirm the real asset path and update it. -->
  <!-- NOTE(review): og:url is the site root on every page; confirm whether a per-page URL is available. -->
  <meta property="og:type" content="website" />
  <meta property="og:image" content="https://github.com/natolambert/rlhf-book/blob/main/images/rlhf-book-share" />
  <meta property="og:image:width" content="1920" />
  <meta property="og:image:height" content="1080" />
  <meta property="og:title" content="$if(page-title)$$page-title$$else$$title$$endif$ | RLHF Book by Nathan Lambert" />
  <meta property="og:description" content="The Reinforcement Learning from Human Feedback Book" />
  <meta property="og:url" content="https://rlhfbook.com" />

  <!-- Optional metadata: one author tag per author entry, then date and keywords when they are set. -->
$for(author-meta)$
  <meta name="author" content="$author-meta$" />
$endfor$
$if(date-meta)$
  <meta name="dcterms.date" content="$date-meta$" />
$endif$
$if(keywords)$
  <meta name="keywords" content="$for(keywords)$$keywords$$sep$, $endfor$" />
$endif$
  <!-- Page title: the page-title variable when set, otherwise title, followed by the site suffix. Kept on one line so no template indentation or newlines end up inside the title text. -->
  <title>$if(page-title)$$page-title$$else$$title$$endif$ | RLHF Book by Nathan Lambert</title>
  
  <!-- Inline styles: the output of the styles.html and style.css template includes (presumably Pandoc partials; confirm against the build). -->
  <style>
    $styles.html()$
    $style.css()$
  </style>
  <!-- One external stylesheet link per entry in the css variable. -->
$for(css)$
  <link rel="stylesheet" href="$css$" />
$endfor$
$if(math)$
  <!-- Emitted only when the math variable is set: its content, then overflow rules for display equations. -->
  $math$
  <style>
    /* Target all possible MathJax display containers */
    /* Wide display math scrolls horizontally and is capped at the container width. */
    .MathJax_Display, .MJXc-display, .math.display, mjx-container[jax="CHTML"][display="true"], mjx-container[jax="SVG"][display="true"] {
      overflow-x: auto;
      max-width: 100%;
      padding: 0.5em 0;
    }
  </style>
$endif$
  <!-- HTML5 element shim, loaded only by Internet Explorer versions below 9 through the conditional comment. Fetched over explicit https rather than a protocol-relative URL. -->
  <!--[if lt IE 9]>
    <script src="https://cdnjs.cloudflare.com/ajax/libs/html5shiv/3.7.3/html5shiv-printshiv.min.js"></script>
  <![endif]-->
<!-- Extra head content, one entry per item in the header-includes variable. -->
$for(header-includes)$
  $header-includes$
$endfor$

<!-- Custom site scripts, both loaded with defer. Judging by the file names they provide navigation and heading anchors; their contents are not visible here. -->
<script src="nav.js" defer></script>
<script src="header-anchors.js" defer></script>

</head>
<body>
<!-- Entries of the include-before variable are emitted first inside body. -->
$for(include-before)$
$include-before$
$endfor$
$if(title)$
<!-- Title block, rendered only when a title is set: linked title, optional subtitle, one line per author, and the navigation dropdown element. -->
<header id="title-block-header">
<!-- The title links to the site home page; the inline style makes the link inherit the heading color with no underline. -->
<h1 class="title"><a href="https://rlhfbook.com/" style="color: inherit; text-decoration: none;">$title$</a></h1>
$if(subtitle)$
<p class="subtitle">$subtitle$</p>
$endif$
$for(author)$
<p class="author">$author$</p>
$endfor$
<!-- Custom element, presumably defined by nav.js (TODO confirm); it starts with expanded set to false. -->
<navigation-dropdown expanded="false"></navigation-dropdown>

</header>
$endif$
$if(toc)$
<!-- The heading and the table of contents are emitted together, so the heading never appears on a page that has no table of contents. -->
<div> <h3> Chapter Contents </h3> </div>
<nav id="$idprefix$TOC" role="doc-toc">
$if(toc-title)$
<h2 id="$idprefix$toc-title">$toc-title$</h2>
$endif$
$table-of-contents$
</nav>
$endif$
<!-- Main document content. The body variable sits at column 0 so the template engine does not apply automatic nesting and re-indent every line of the rendered body. -->
<div id="content">
$body$
</div>

<!-- Previous and next chapter links, placed at opposite ends of a flex row. Each link is emitted only when its URL variable is set. -->
<div id="chapter-navigation" style="display: flex; justify-content: space-between; padding: 2em 0;">
  $if(prev-url)$
  <a href="$prev-url$" class="prev-chapter">
    ← Previous: $prev-chapter$
  </a>
  $else$
  <!-- Empty placeholder: with space-between it keeps the next link at the far end when there is no previous chapter. -->
  <div></div>
  $endif$
  
  $if(next-url)$
  <a href="$next-url$" class="next-chapter">
    Next: $next-chapter$ →
  </a>
  $endif$
</div>
<!-- Entries of the include-after variable are emitted here, after the chapter navigation and before the footer. -->
$for(include-after)$
$include-after$
$endfor$
<!-- Site footer: BibTeX citation, repository link, and copyright notice. -->
<footer style="padding: 20px; text-align: center;">
  <hr>
  Citation <br>
  <!-- The entry uses ordinary spaces and newlines, preserved by white-space: pre-wrap, so text copied from the page is plain BibTeX without non-breaking spaces. The text must start right after the opening tag and stay unindented. -->
  <div style="text-align: left; font-size: small; color: #888; white-space: pre-wrap;">@book{rlhf2024,
  author = {Nathan Lambert},
  title = {Reinforcement Learning from Human Feedback},
  year = {2024},
  publisher = {Online},
  url = {https://rlhfbook.com},
}</div>
  <div>
    <!-- Opens in a new tab; rel prevents the opened page from reaching back through window.opener. -->
    <a href="https://github.com/natolambert/rlhf-book" target="_blank" rel="noopener noreferrer">
      <img src="https://github.githubassets.com/images/modules/logos_page/GitHub-Mark.png" alt="GitHub" style="width: 40px; height: 40px;">
    </a>
    <!-- Add more social links here -->
  </div>
  <p>&copy; 2024 RLHF Book Team</p>
</footer>
</body>
</html>